
#export CUDA_VISIBLE_DEVICES=0
# qwen 1.5b fp16
#vllm serve /root/yuehu/assets/Qwen2.5-1.5B-Instruct --port 8000 > log.1.8b.txt 2>&1 &

# export CUDA_VISIBLE_DEVICES=2
# # qwen 7b int4
# vllm serve /root/yuehu/assets/Qwen2.5-7B-Instruct-AWQ --port 8081 > log.7b.txt 2>&1 &

# Set and export the GPU selection so the server started below inherits it.
CUDA_VISIBLE_DEVICES=3
export CUDA_VISIBLE_DEVICES

# Launch `vllm serve` for the Qwen2.5-7B-Instruct checkpoint on port 8082 as a
# background job. stdout and stderr are both written to log.7b.txt, which is
# truncated on every launch.
# NOTE(review): this launch was previously labelled "int4", but the model path
# has no -AWQ suffix -- presumably the unquantized checkpoint; confirm.
vllm serve /root/yuehu/assets/Qwen2.5-7B-Instruct \
  --port 8082 \
  >log.7b.txt 2>&1 &
